{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 数据目标\n",
    "1. 下载pdf\n",
    "2. 解决验证码问题\n",
    "3. 可视化分析"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [],
   "source": [
    "import time\n",
    "from io import StringIO\n",
    "\n",
    "import pandas as pd\n",
    "from selenium import webdriver\n",
    "from selenium.webdriver.common.by import By"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [],
   "source": [
    "from selenium.webdriver.common.desired_capabilities import DesiredCapabilities\n",
    "\n",
    "\n",
    "# Chrome launch flags collected on a standalone ChromeOptions object.\n",
    "# NOTE(review): the cell that creates the driver builds its own `options` object,\n",
    "# so these flags only take effect if `opts` is what gets passed to webdriver.Chrome -- confirm.\n",
    "opts = webdriver.ChromeOptions()\n",
    "opts.add_argument('--no-sandbox')  # works around the DevToolsActivePort-file-not-found startup error\n",
    "# Chrome expects --window-size as WIDTH,HEIGHT (comma-separated); the 'x'-separated\n",
    "# spelling is not reliably parsed outside headless mode.\n",
    "opts.add_argument('--window-size=1920,3000')  # browser window resolution\n",
    "opts.add_argument('--disable-gpu')  # Google's docs mention this flag as a workaround for a bug\n",
    "opts.add_argument('--hide-scrollbars')  # hide scrollbars, for the odd page that needs it\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-33-948c993d96ba>:5: DeprecationWarning: use options instead of chrome_options\n",
      "  driver = webdriver.Chrome(executable_path=r'C:\\Program Files (x86)\\Google\\Chrome\\Application\\chromedriver.exe', chrome_options=options)\n"
     ]
    }
   ],
   "source": [
    "# Start Chrome with a fixed download directory for the PDFs.\n",
    "options = webdriver.ChromeOptions()\n",
    "out_path = r'D:\\CNKI\\PDF文章'  # download target directory; machine-specific, change to your own path\n",
    "prefs = {\n",
    "    'profile.default_content_settings.popups': 0,  # presumably suppresses the download pop-up -- confirm\n",
    "    'download.default_directory': out_path,\n",
    "}\n",
    "options.add_experimental_option('prefs', prefs)\n",
    "# Pass the options via `options=`; the `chrome_options=` keyword raises a DeprecationWarning.\n",
    "driver = webdriver.Chrome(\n",
    "    executable_path=r'C:\\Program Files (x86)\\Google\\Chrome\\Application\\chromedriver.exe',\n",
    "    options=options,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load the CNKI landing page in the Selenium-controlled browser.\n",
    "cnki_home_url = 'https://www.cnki.net/'\n",
    "driver.get(cnki_home_url)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 登录"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'中山大学南...'"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the innerHTML of the element with id Ecp_loginShowName1\n",
    "# (presumably the display name of the logged-in account -- confirm).\n",
    "driver.find_element(By.ID, \"Ecp_loginShowName1\").get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 高级检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the element with id `highSearch` (the advanced-search entry, going by the section heading).\n",
    "driver.find_element(By.XPATH, '//*[@id=\"highSearch\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['CDwindow-22DB092F568C9522BC0E3D6842508ED9', 'CDwindow-F95F3D86ABCBFE06C1D00981E9E843A7']\n"
     ]
    }
   ],
   "source": [
    "# Show every open window handle, then point the driver at the last one in the list.\n",
    "print (driver.window_handles)\n",
    "newest_handle = driver.window_handles[-1]\n",
    "driver.switch_to.window(newest_handle)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Locate a <span> by its absolute XPath and click it.\n",
    "# NOTE(review): the path is purely position-based, so it breaks if the page layout changes.\n",
    "element = driver.find_element(By.XPATH, '/html/body/div[3]/div[1]/div/ul[1]/li[1]/a/span')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 专业检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the fourth <li> of the list (the professional-search tab, going by the section heading).\n",
    "element = driver.find_element(By.XPATH, '/html/body/div[2]/div/div[2]/ul/li[4]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 关键词输入并检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Replace the contents of the query <textarea> with the search expression.\n",
    "# NOTE(review): the first term opens with a curly quote but closes with a straight one --\n",
    "# confirm CNKI parses the expression as intended.\n",
    "element = driver.find_element(By.XPATH, '/html/body/div[2]/div/div[2]/div/div[1]/div[1]/div[2]/textarea')\n",
    "element.clear()\n",
    "element.send_keys(' SU=“大数据\" AND SU=“网络”')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Run the search by clicking the <input> button next to the query box.\n",
    "element = driver.find_element(By.XPATH, '/html/body/div[2]/div/div[2]/div/div[1]/div[1]/div[2]/div[2]/input')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 统计文章数量"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'4,604'"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the hit count from the <em> inside #countPageDiv; it comes back as text (e.g. '4,604'), not a number.\n",
    "driver.find_element(By.XPATH, '//*[@id=\"countPageDiv\"]/span[1]/em').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "###  更换为显示50篇"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the icon inside #perPageDiv (presumably opens the results-per-page dropdown -- confirm).\n",
    "element = driver.find_element(By.XPATH, '//*[@id=\"perPageDiv\"]/div/i')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Pick the entry whose data-val is 50. click() returns None, so its result is not stored.\n",
    "driver.find_element(By.XPATH, '//div[@id=\"perPageDiv\"]//li[@data-val=\"50\"]/a').click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 抓取页面信息"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>基于网络大数据的大学生自杀风险主动识别与及时干预</td>\n",
       "      <td>刘爱楼</td>\n",
       "      <td>佳木斯职业学院学报</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>网络大数据信用风险评分能有效预测信贷违约风险吗？</td>\n",
       "      <td>李焱文; 蒋文华; 王纯洁</td>\n",
       "      <td>经济问题</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>大数据时代计算机网络信息安全研究——评《网络安全态势感知:提取、理解和预测》</td>\n",
       "      <td>周晶波</td>\n",
       "      <td>安全与环境学报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>大数据时代人工智能在计算机网络技术中的运用</td>\n",
       "      <td>任思颖</td>\n",
       "      <td>科技经济导刊</td>\n",
       "      <td>2021-06-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>245.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>大数据时代下计算机网络信息安全问题的探讨与防范</td>\n",
       "      <td>刘付桂兰</td>\n",
       "      <td>科技经济导刊</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>408.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于大数据的电力信息系统网络安全分析</td>\n",
       "      <td>李秉裕; 王佳宝; 樊科; 姚勇志</td>\n",
       "      <td>电子世界</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>基于大数据时代的计算机网络安全技术应用分析</td>\n",
       "      <td>唐培全; 戴小佳</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-06-11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>698.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>大数据下的计算机网络信息安全分析</td>\n",
       "      <td>付蓉</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-06-11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>693.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>大数据时代计算机网络技术在信息化管理中的应用</td>\n",
       "      <td>杨远正</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-06-11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>206.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>大数据背景下计算机网络安全防范措施探析</td>\n",
       "      <td>傅望</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-06-11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>160.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>大数据系统推介下的网络消费异化：表征、溯因及消解</td>\n",
       "      <td>马会端</td>\n",
       "      <td>河南师范大学学报(哲学社会科学版)</td>\n",
       "      <td>2021-06-09 13:41</td>\n",
       "      <td>NaN</td>\n",
       "      <td>239.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>大数据分析助力银行网络运维转型发展</td>\n",
       "      <td>孔浩; 刘彬</td>\n",
       "      <td>中国金融电脑</td>\n",
       "      <td>2021-06-07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>70.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据背景下计算机网络安全防范措施研究</td>\n",
       "      <td>李震乾</td>\n",
       "      <td>科技与创新</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>25.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据时代计算机远程网络通信技术的应用研究</td>\n",
       "      <td>黄晓平</td>\n",
       "      <td>科学咨询(科技·管理)</td>\n",
       "      <td>2021-06-04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>大数据背景下的网络信息安全控制策略分析</td>\n",
       "      <td>武燕平</td>\n",
       "      <td>产业与科技论坛</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>计算机网络中大数据与人工智能技术的应用</td>\n",
       "      <td>许妙水</td>\n",
       "      <td>计算机与网络</td>\n",
       "      <td>2021-05-26</td>\n",
       "      <td>NaN</td>\n",
       "      <td>26.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>大数据时代的计算机网络安全防范策略</td>\n",
       "      <td>马颖</td>\n",
       "      <td>计算机与网络</td>\n",
       "      <td>2021-05-26</td>\n",
       "      <td>NaN</td>\n",
       "      <td>14.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>智能网络下职业健康风险大数据分析方法</td>\n",
       "      <td>刘博; 邓舒平; 杨楠; 郑继辉; 谢金龙</td>\n",
       "      <td>信息技术</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>99.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>大数据环境下的网络考试平台的开发及应用研究</td>\n",
       "      <td>陈辉彬</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>13.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>大数据技术在网络入侵检测的应用</td>\n",
       "      <td>李新新</td>\n",
       "      <td>信息技术与信息化</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>74.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>简析大数据背景下信息通信网络安全管理策略</td>\n",
       "      <td>李鹏举</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>4.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>大数据背景下计算机信息技术在网络安全中的运用探析</td>\n",
       "      <td>格桑次仁</td>\n",
       "      <td>数字技术与应用</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>大数据背景下网络营销对策</td>\n",
       "      <td>郑昕</td>\n",
       "      <td>营销界</td>\n",
       "      <td>2021-05-21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>298.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>基于卷积神经网络的健康大数据智能分析方法研究</td>\n",
       "      <td>白贺伊</td>\n",
       "      <td>电子设计工程</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>211.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据与计算机网络的信息安全策略分析</td>\n",
       "      <td>李培培</td>\n",
       "      <td>电子技术</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>417.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>大数据样本与半监督环境下基于生成对抗网络的故障诊断</td>\n",
       "      <td>潘继财</td>\n",
       "      <td>机械与电子</td>\n",
       "      <td>2021-05-19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>94.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>企业网络、大数据能力与商业模式创新机制研究——基于fs QCA方法的实证分析  网络首发</td>\n",
       "      <td>李文; 张珍珍; 梅蕾</td>\n",
       "      <td>科技进步与对策</td>\n",
       "      <td>2021-05-18 15:15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>557.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>基于大数据的计算机网络信息安全防护措施研究</td>\n",
       "      <td>曹仰之</td>\n",
       "      <td>电脑编程技巧与维护</td>\n",
       "      <td>2021-05-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>251.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>大数据背景下高校网络思想政治教育的安全风险对策研究</td>\n",
       "      <td>莫靖聪</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>214.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>探讨大数据视域下的高校网络安全课程教学改革创新</td>\n",
       "      <td>张玲玲</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>103.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>人工智能及大数据的网络安全态势感知研究</td>\n",
       "      <td>王晓娜; 李晓宇; 李芙蓉</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>502.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>大数据时代的网络黑客攻击与防范治理</td>\n",
       "      <td>董颖</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>345.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>大数据时代计算机网络信息安全研究</td>\n",
       "      <td>席攀锋</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1072.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>大数据背景下计算机网络信息安全探究</td>\n",
       "      <td>马天午</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>388.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>基于大数据时代下的计算机网络安全研究</td>\n",
       "      <td>陈亚科</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>170.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>大数据背景下网络信息安全技术体系分析</td>\n",
       "      <td>童瀛; 姚焕章; 周宇</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>670.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据系统中的计算机网络安全技术</td>\n",
       "      <td>郑志荣</td>\n",
       "      <td>网络安全技术与应用</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>247.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>广电总局制定网络视听收视大数据行业标准播放数据将有统一标准</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国有线电视</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>10.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>大数据时代计算机网络信息安全及防护策略探究</td>\n",
       "      <td>陈伟</td>\n",
       "      <td>电子世界</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>173.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>大数据时代人工智能在计算机网络技术中的应用研究</td>\n",
       "      <td>郁陶</td>\n",
       "      <td>电子世界</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>163.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>基于大数据的网络舆情多维动态分类研究</td>\n",
       "      <td>高慧</td>\n",
       "      <td>电脑知识与技术</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>22.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>基于大数据技术的网络热搜关键词提取算法</td>\n",
       "      <td>王珊珊; 梁同乐</td>\n",
       "      <td>电子测试</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于大数据时代人工智能在计算机网络技术中的应用</td>\n",
       "      <td>李晓霞</td>\n",
       "      <td>电子测试</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>47.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>大数据技术在通信网络中的应用</td>\n",
       "      <td>毛莉艳</td>\n",
       "      <td>电子技术与软件工程</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>22.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>计算机大数据分析与云计算网络技术应用研究</td>\n",
       "      <td>王玲玲</td>\n",
       "      <td>电子技术与软件工程</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>65.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>县市台大数据网络融媒体应用研究</td>\n",
       "      <td>李晓磊; 李志辉</td>\n",
       "      <td>影视制作</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>县市级大数据网络融媒体平台应用研究</td>\n",
       "      <td>李晓磊; 赵宇</td>\n",
       "      <td>广播与电视技术</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>基于大数据的计算机网络数据库安全技术</td>\n",
       "      <td>马颖</td>\n",
       "      <td>计算机与网络</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>52.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>基于网格化和大数据的移动网络覆盖质量评估方法研究</td>\n",
       "      <td>李智峰</td>\n",
       "      <td>无线互联科技</td>\n",
       "      <td>2021-05-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>大数据支持下网络谣言智慧治理研究</td>\n",
       "      <td>张鑫</td>\n",
       "      <td>合作经济与科技</td>\n",
       "      <td>2021-05-07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>222.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                            篇名  \\\n",
       "0            1                      基于网络大数据的大学生自杀风险主动识别与及时干预   \n",
       "1            2                      网络大数据信用风险评分能有效预测信贷违约风险吗？   \n",
       "2            3        大数据时代计算机网络信息安全研究——评《网络安全态势感知:提取、理解和预测》   \n",
       "3            4                         大数据时代人工智能在计算机网络技术中的运用   \n",
       "4            5                       大数据时代下计算机网络信息安全问题的探讨与防范   \n",
       "5            6                            基于大数据的电力信息系统网络安全分析   \n",
       "6            7                         基于大数据时代的计算机网络安全技术应用分析   \n",
       "7            8                              大数据下的计算机网络信息安全分析   \n",
       "8            9                        大数据时代计算机网络技术在信息化管理中的应用   \n",
       "9           10                           大数据背景下计算机网络安全防范措施探析   \n",
       "10          11                      大数据系统推介下的网络消费异化：表征、溯因及消解   \n",
       "11          12                             大数据分析助力银行网络运维转型发展   \n",
       "12          13                           大数据背景下计算机网络安全防范措施研究   \n",
       "13          14                         大数据时代计算机远程网络通信技术的应用研究   \n",
       "14          15                           大数据背景下的网络信息安全控制策略分析   \n",
       "15          16                           计算机网络中大数据与人工智能技术的应用   \n",
       "16          17                             大数据时代的计算机网络安全防范策略   \n",
       "17          18                            智能网络下职业健康风险大数据分析方法   \n",
       "18          19                         大数据环境下的网络考试平台的开发及应用研究   \n",
       "19          20                               大数据技术在网络入侵检测的应用   \n",
       "20          21                          简析大数据背景下信息通信网络安全管理策略   \n",
       "21          22                      大数据背景下计算机信息技术在网络安全中的运用探析   \n",
       "22          23                                  大数据背景下网络营销对策   \n",
       "23          24                        基于卷积神经网络的健康大数据智能分析方法研究   \n",
       "24          25                            大数据与计算机网络的信息安全策略分析   \n",
       "25          26                     大数据样本与半监督环境下基于生成对抗网络的故障诊断   \n",
       "26          27  企业网络、大数据能力与商业模式创新机制研究——基于fs QCA方法的实证分析  网络首发   \n",
       "27          28                         基于大数据的计算机网络信息安全防护措施研究   \n",
       "28          29                     大数据背景下高校网络思想政治教育的安全风险对策研究   \n",
       "29          30                       探讨大数据视域下的高校网络安全课程教学改革创新   \n",
       "30          31                           人工智能及大数据的网络安全态势感知研究   \n",
       "31          32                             大数据时代的网络黑客攻击与防范治理   \n",
       "32          33                              大数据时代计算机网络信息安全研究   \n",
       "33          34                             大数据背景下计算机网络信息安全探究   \n",
       "34          35                            基于大数据时代下的计算机网络安全研究   \n",
       "35          36                            大数据背景下网络信息安全技术体系分析   \n",
       "36          37                              大数据系统中的计算机网络安全技术   \n",
       "37          38                 广电总局制定网络视听收视大数据行业标准播放数据将有统一标准   \n",
       "38          39                         大数据时代计算机网络信息安全及防护策略探究   \n",
       "39          40                       大数据时代人工智能在计算机网络技术中的应用研究   \n",
       "40          41                            基于大数据的网络舆情多维动态分类研究   \n",
       "41          42                           基于大数据技术的网络热搜关键词提取算法   \n",
       "42          43                       基于大数据时代人工智能在计算机网络技术中的应用   \n",
       "43          44                                大数据技术在通信网络中的应用   \n",
       "44          45                          计算机大数据分析与云计算网络技术应用研究   \n",
       "45          46                               县市台大数据网络融媒体应用研究   \n",
       "46          47                             县市级大数据网络融媒体平台应用研究   \n",
       "47          48                            基于大数据的计算机网络数据库安全技术   \n",
       "48          49                      基于网格化和大数据的移动网络覆盖质量评估方法研究   \n",
       "49          50                              大数据支持下网络谣言智慧治理研究   \n",
       "\n",
       "                       作者                 刊名              发表时间  被引      下载  操作  \n",
       "0                     刘爱楼          佳木斯职业学院学报        2021-06-30 NaN     NaN  下载  \n",
       "1           李焱文; 蒋文华; 王纯洁               经济问题        2021-06-25 NaN   119.0  下载  \n",
       "2                     周晶波            安全与环境学报        2021-06-25 NaN     NaN  下载  \n",
       "3                     任思颖             科技经济导刊        2021-06-18 NaN   245.0  下载  \n",
       "4                    刘付桂兰             科技经济导刊        2021-06-15 NaN   408.0  下载  \n",
       "5       李秉裕; 王佳宝; 樊科; 姚勇志               电子世界        2021-06-15 NaN     NaN  下载  \n",
       "6                唐培全; 戴小佳          网络安全技术与应用        2021-06-11 NaN   698.0  下载  \n",
       "7                      付蓉          网络安全技术与应用        2021-06-11 NaN   693.0  下载  \n",
       "8                     杨远正          网络安全技术与应用        2021-06-11 NaN   206.0  下载  \n",
       "9                      傅望          网络安全技术与应用        2021-06-11 NaN   160.0  下载  \n",
       "10                    马会端  河南师范大学学报(哲学社会科学版)  2021-06-09 13:41 NaN   239.0  下载  \n",
       "11                 孔浩; 刘彬             中国金融电脑        2021-06-07 NaN    70.0  下载  \n",
       "12                    李震乾              科技与创新        2021-06-05 NaN    25.0  下载  \n",
       "13                    黄晓平        科学咨询(科技·管理)        2021-06-04 NaN    58.0  下载  \n",
       "14                    武燕平            产业与科技论坛        2021-06-01 NaN    20.0  下载  \n",
       "15                    许妙水             计算机与网络        2021-05-26 NaN    26.0  下载  \n",
       "16                     马颖             计算机与网络        2021-05-26 NaN    14.0  下载  \n",
       "17  刘博; 邓舒平; 杨楠; 郑继辉; 谢金龙               信息技术        2021-05-25 NaN    99.0  下载  \n",
       "18                    陈辉彬            电脑知识与技术        2021-05-25 NaN    13.0  下载  \n",
       "19                    李新新           信息技术与信息化        2021-05-25 NaN    74.0  下载  \n",
       "20                    李鹏举            数字技术与应用        2021-05-25 NaN     4.0  下载  \n",
       "21                   格桑次仁            数字技术与应用        2021-05-25 NaN     3.0  下载  \n",
       "22                     郑昕                营销界        2021-05-21 NaN   298.0  下载  \n",
       "23                    白贺伊             电子设计工程        2021-05-20 NaN   211.0  下载  \n",
       "24                    李培培               电子技术        2021-05-20 NaN   417.0  下载  \n",
       "25                    潘继财              机械与电子        2021-05-19 NaN    94.0  下载  \n",
       "26            李文; 张珍珍; 梅蕾            科技进步与对策  2021-05-18 15:15 NaN   557.0  下载  \n",
       "27                    曹仰之          电脑编程技巧与维护        2021-05-18 NaN   251.0  下载  \n",
       "28                    莫靖聪          网络安全技术与应用        2021-05-15 NaN   214.0  下载  \n",
       "29                    张玲玲          网络安全技术与应用        2021-05-15 NaN   103.0  下载  \n",
       "30          王晓娜; 李晓宇; 李芙蓉          网络安全技术与应用        2021-05-15 NaN   502.0  下载  \n",
       "31                     董颖          网络安全技术与应用        2021-05-15 NaN   345.0  下载  \n",
       "32                    席攀锋          网络安全技术与应用        2021-05-15 NaN  1072.0  下载  \n",
       "33                    马天午          网络安全技术与应用        2021-05-15 NaN   388.0  下载  \n",
       "34                    陈亚科          网络安全技术与应用        2021-05-15 NaN   170.0  下载  \n",
       "35            童瀛; 姚焕章; 周宇          网络安全技术与应用        2021-05-15 NaN   670.0  下载  \n",
       "36                    郑志荣          网络安全技术与应用        2021-05-15 NaN   247.0  下载  \n",
       "37                    NaN             中国有线电视        2021-05-15 NaN    10.0  下载  \n",
       "38                     陈伟               电子世界        2021-05-15 NaN   173.0  下载  \n",
       "39                     郁陶               电子世界        2021-05-15 NaN   163.0  下载  \n",
       "40                     高慧            电脑知识与技术        2021-05-15 NaN    22.0  下载  \n",
       "41               王珊珊; 梁同乐               电子测试        2021-05-15 NaN    24.0  下载  \n",
       "42                    李晓霞               电子测试        2021-05-15 NaN    47.0  下载  \n",
       "43                    毛莉艳          电子技术与软件工程        2021-05-15 NaN    22.0  下载  \n",
       "44                    王玲玲          电子技术与软件工程        2021-05-15 NaN    65.0  下载  \n",
       "45               李晓磊; 李志辉               影视制作        2021-05-15 NaN     2.0  下载  \n",
       "46                李晓磊; 赵宇            广播与电视技术        2021-05-15 NaN     6.0  下载  \n",
       "47                     马颖             计算机与网络        2021-05-12 NaN    52.0  下载  \n",
       "48                    李智峰             无线互联科技        2021-05-10 NaN     NaN  下载  \n",
       "49                     张鑫            合作经济与科技        2021-05-07 NaN   222.0  下载  "
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from io import StringIO\n",
    "\n",
    "# Parse the result table rendered inside the element with id \"gridTable\".\n",
    "element=driver.find_element_by_id('gridTable')\n",
    "data_html=element.get_attribute('innerHTML')\n",
    "# pandas >= 2.1 deprecates passing a literal HTML string to read_html, so the\n",
    "# markup is handed over as a file-like object (older versions accept this too).\n",
    "pd.read_html(StringIO(data_html))[0]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 爬取文章信息"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import re\n",
    "from urllib.parse import urljoin\n",
    "\n",
    "import requests\n",
    "from lxml import etree\n",
    "\n",
    "# Root of the CNKI search site; relative links are resolved against it.\n",
    "HOST = \"https://kns.cnki.net/\"\n",
    "\n",
    "# Snapshot of the page currently shown by the Selenium driver and its result rows.\n",
    "html = driver.page_source\n",
    "soup = etree.HTML(html)\n",
    "tr_list= soup.xpath('//div[@id=\"gridTable\"]/table/tbody/tr')\n",
    "\n",
    "# Headers sent with every requests call in this notebook.\n",
    "# The logged-in session cookie is a credential, so it is read from the\n",
    "# CNKI_COOKIE environment variable instead of being stored in the notebook.\n",
    "headers = {\n",
    "    'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.212 Safari/537.36'\n",
    "}\n",
    "_cnki_cookie = os.environ.get(\"CNKI_COOKIE\")\n",
    "if _cnki_cookie:\n",
    "    headers[\"Cookie\"] = _cnki_cookie\n",
    "def get_data(href):\n",
    "    \"\"\"Build the CNKI detail-page URL from a search-result link.\n",
    "\n",
    "    The values of the ``DbCode``, ``dbname`` and ``filename`` query parameters\n",
    "    are copied from ``href`` into a ``kcms/detail/detail.aspx`` URL.\n",
    "\n",
    "    Args:\n",
    "        href: Link taken from a result row; it must contain all three parameters.\n",
    "\n",
    "    Returns:\n",
    "        The detail-page URL as a string.\n",
    "\n",
    "    Raises:\n",
    "        IndexError: If one of the three parameters is missing from ``href``.\n",
    "    \"\"\"\n",
    "    def _param(name):\n",
    "        # [^&#]* stops at the next parameter but also accepts a value at the very\n",
    "        # end of the link, where no trailing '&' follows.\n",
    "        return re.findall(rf\"{name}=([^&#]*)\", href)[0]\n",
    "\n",
    "    DbCode = _param(\"DbCode\")\n",
    "    dbname = _param(\"dbname\")\n",
    "    filename = _param(\"filename\")\n",
    "    return f\"https://kns.cnki.net/kcms/detail/detail.aspx?dbcode={DbCode}&dbname={dbname}&filename={filename}\"\n",
    "\n",
    "def download(href, timeout=30):\n",
    "    \"\"\"Look up the PDF download link on a CNKI detail page.\n",
    "\n",
    "    The page at ``href`` is fetched with the notebook-wide ``headers`` and the\n",
    "    ``href`` of the link inside ``<li class=\"btn-dlpdf\">`` is extracted. Nothing\n",
    "    is downloaded here; only the link is resolved.\n",
    "\n",
    "    Args:\n",
    "        href: URL of the article detail page.\n",
    "        timeout: Seconds to wait for the server before requests raises.\n",
    "\n",
    "    Returns:\n",
    "        The link joined onto ``HOST``, or the literal string \"没有下载链接\" when\n",
    "        the page contains no such link.\n",
    "    \"\"\"\n",
    "    # Without a timeout a stalled connection would block the whole scrape.\n",
    "    page_source = requests.get(url=href,headers=headers,timeout=timeout).text\n",
    "    page_source_soup = etree.HTML(page_source)\n",
    "    download_url = page_source_soup.xpath('//li[@class=\"btn-dlpdf\"]/a/@href')\n",
    "    if download_url:\n",
    "        return urljoin(HOST,download_url[0])\n",
    "    return \"没有下载链接\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [],
   "source": [
    "def downloader(title,href,timeout=30):\n",
    "    \"\"\"Download ``href`` and store the response body as ``<title>.pdf``.\n",
    "\n",
    "    Args:\n",
    "        title: Article title; used for the file name and the progress message.\n",
    "        href: URL of the file to download.\n",
    "        timeout: Seconds to wait for the server before requests raises.\n",
    "\n",
    "    The file is written to the current working directory only when the server\n",
    "    answers with HTTP 200; otherwise a failure message is printed.\n",
    "    \"\"\"\n",
    "    import re\n",
    "\n",
    "    response = requests.get(href,headers=headers,timeout=timeout)\n",
    "    # Compare the numeric status code, not the Response object itself.\n",
    "    if response.status_code == 200:\n",
    "        # Titles may contain characters such as ':' or '?' that are not allowed\n",
    "        # in Windows file names, so they are replaced before opening the file.\n",
    "        safe_title = re.sub(r'[\\\\/:*?\"<>|]', \"_\", title)\n",
    "        with open(f\"{safe_title}.pdf\",\"wb\") as fp:\n",
    "            fp.write(response.content)\n",
    "        print(f\"{title}\",\"成功下载\")\n",
    "    else:\n",
    "        print(\"无法下载\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Upper bound used by the page loop in main().\n",
    "num_pages = 25\n",
    "\n",
    "# One accumulator per output column; main() fills these lists.\n",
    "title_list, author_list, href_list, download_url_list = [], [], [], []\n",
    "\n",
    "def main():\n",
    "    \"\"\"Scrape title, authors, detail link and PDF link from the result pages.\n",
    "\n",
    "    Starting from the page currently shown in ``driver``, every row of the\n",
    "    ``gridTable`` result table is read and then the element with id ``PageNext``\n",
    "    is clicked. The loop runs while the page counter is below ``num_pages``.\n",
    "\n",
    "    A page is recorded only after it was parsed completely and the click on\n",
    "    the next-page element succeeded, so a retry neither duplicates rows nor\n",
    "    uses up a page number.\n",
    "\n",
    "    Returns:\n",
    "        pandas.DataFrame with the columns 标题, 作者, 链接 and 下载链接, built from\n",
    "        the module-level lists that this function extends.\n",
    "    \"\"\"\n",
    "    now_page_count = 1\n",
    "    # NOTE(review): with `<` the loop handles num_pages - 1 pages; confirm that\n",
    "    # this is intended rather than an off-by-one.\n",
    "    while now_page_count < num_pages:\n",
    "        html = driver.page_source\n",
    "        page_rows = []\n",
    "        try:\n",
    "            soup = etree.HTML(html)\n",
    "            tr_list= soup.xpath('//div[@id=\"gridTable\"]/table/tbody/tr')\n",
    "            for tr in tr_list:\n",
    "                title = \"\".join(tr.xpath('td[@class=\"name\"]//text()')).strip().replace(\"\\n\",\"\").replace(\"                              网络首发\",\"\")\n",
    "                author = \",\".join(tr.xpath('td[@class=\"author\"]/a//text()')).strip().replace(\"\\n\",\"\")\n",
    "                href = tr.xpath('td[@class=\"name\"]/a/@href')[0]\n",
    "                href = get_data(href)\n",
    "                download_url = download(href)\n",
    "                page_rows.append((title, author, href, download_url))\n",
    "            driver.find_element_by_xpath('//*[@id=\"PageNext\"]').click()\n",
    "        except Exception as exc:\n",
    "            # Wait and retry the same page; the original note says this pause is\n",
    "            # for the captcha that appears after 500+ records.\n",
    "            # Exception (not a bare except) keeps Ctrl-C able to stop the loop.\n",
    "            print(f\"第{now_page_count}页处理失败，10秒后重试：{exc!r}\")\n",
    "            time.sleep(10)\n",
    "            continue\n",
    "        # The page succeeded as a whole: commit its rows and advance the counter.\n",
    "        for title, author, href, download_url in page_rows:\n",
    "            title_list.append(title)\n",
    "            author_list.append(author)\n",
    "            href_list.append(href)\n",
    "            download_url_list.append(download_url)\n",
    "        now_page_count = now_page_count + 1\n",
    "        time.sleep(0.5)\n",
    "    data = {\"标题\":title_list,\"作者\":author_list,\"链接\":href_list,\"下载链接\":download_url_list}\n",
    "    data = pd.DataFrame(data)\n",
    "    return data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>标题</th>\n",
       "      <th>作者</th>\n",
       "      <th>链接</th>\n",
       "      <th>下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>基于网络大数据的大学生自杀风险主动识别与及时干预</td>\n",
       "      <td>刘爱楼</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>网络大数据信用风险评分能有效预测信贷违约风险吗？</td>\n",
       "      <td>李焱文,蒋文华,王纯洁</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>大数据时代计算机网络信息安全研究——评《网络安全态势感知:提取、理解和预测》</td>\n",
       "      <td>周晶波</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>大数据时代人工智能在计算机网络技术中的运用</td>\n",
       "      <td>任思颖</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>大数据时代下计算机网络信息安全问题的探讨与防范</td>\n",
       "      <td>刘付桂兰</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1195</th>\n",
       "      <td>大数据时代计算机网络信息安全及防护研究</td>\n",
       "      <td>滕飞</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1196</th>\n",
       "      <td>大数据时代的计算机网络安全及防范措施探析</td>\n",
       "      <td>汪晓睿</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1197</th>\n",
       "      <td>大数据环境下网络舆情智能预警机制研究</td>\n",
       "      <td>易臣何,何雪平</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1198</th>\n",
       "      <td>基于大数据的网络安全与情报分析研究</td>\n",
       "      <td>罗翔</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1199</th>\n",
       "      <td>大数据&amp;人工智能时代下网络安全的实践</td>\n",
       "      <td>刘树锋,陈思德,邱锋兴</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1200 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                          标题           作者  \\\n",
       "0                   基于网络大数据的大学生自杀风险主动识别与及时干预          刘爱楼   \n",
       "1                   网络大数据信用风险评分能有效预测信贷违约风险吗？  李焱文,蒋文华,王纯洁   \n",
       "2     大数据时代计算机网络信息安全研究——评《网络安全态势感知:提取、理解和预测》          周晶波   \n",
       "3                      大数据时代人工智能在计算机网络技术中的运用          任思颖   \n",
       "4                    大数据时代下计算机网络信息安全问题的探讨与防范         刘付桂兰   \n",
       "...                                      ...          ...   \n",
       "1195                     大数据时代计算机网络信息安全及防护研究           滕飞   \n",
       "1196                    大数据时代的计算机网络安全及防范措施探析          汪晓睿   \n",
       "1197                      大数据环境下网络舆情智能预警机制研究      易臣何,何雪平   \n",
       "1198                       基于大数据的网络安全与情报分析研究           罗翔   \n",
       "1199                      大数据&人工智能时代下网络安全的实践  刘树锋,陈思德,邱锋兴   \n",
       "\n",
       "                                                     链接  \\\n",
       "0     https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1     https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2     https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3     https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4     https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "...                                                 ...   \n",
       "1195  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1196  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1197  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1198  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1199  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                                   下载链接  \n",
       "0     https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1     https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2     https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3     https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4     https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "...                                                 ...  \n",
       "1195  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1196  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1197  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1198  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1199  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[1200 rows x 4 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Run the scraper and show the DataFrame it returns.\n",
    "data = main()\n",
    "display(data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Save the scraped table to an Excel workbook, on the sheet named \"文章\".\n",
    "data.to_excel('CNKI_数据挖掘.xlsx',sheet_name=\"文章\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 调用API"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [],
   "source": [
    "import re\n",
    "from urllib.parse import urljoin\n",
    "from uuid import uuid4\n",
    "import requests\n",
    "import base64\n",
    "from PIL  import Image"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [],
   "source": [
    "def base64_api(uname, pwd, img, typeid):\n",
    "    \"\"\"Send an image file to the ttshitu prediction endpoint.\n",
    "\n",
    "    Args:\n",
    "        uname: Account name sent as ``username``.\n",
    "        pwd: Account password sent as ``password``.\n",
    "        img: Path of the image file; its bytes are sent base64-encoded.\n",
    "        typeid: Value forwarded unchanged as ``typeid``.\n",
    "\n",
    "    Returns:\n",
    "        ``result[\"data\"][\"result\"]`` when the response reports success, otherwise\n",
    "        the service's ``message`` text. Both are returned the same way, so the\n",
    "        caller cannot tell them apart from the return value alone.\n",
    "    \"\"\"\n",
    "    with open(img, 'rb') as f:\n",
    "        b64 = base64.b64encode(f.read()).decode()\n",
    "    data = {\"username\": uname, \"password\": pwd, \"typeid\": typeid, \"image\": b64}\n",
    "    # Response.json() decodes the body directly, so no json import is needed.\n",
    "    result = requests.post(\"http://api.ttshitu.com/predict\", json=data).json()\n",
    "    if result['success']:\n",
    "        return result[\"data\"][\"result\"]\n",
    "    else:\n",
    "        return result[\"message\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [],
   "source": [
    "def cut_picture(picture_path, crop_box=(486,354,750,415)):\n",
    "    \"\"\"Crop a region out of ``<picture_path>.jpg`` and save it as ``<picture_path>.png``.\n",
    "\n",
    "    Args:\n",
    "        picture_path: File path without extension.\n",
    "        crop_box: ``(left, upper, right, lower)`` pixel box passed to\n",
    "            ``Image.crop``; the default is the box this notebook has always used.\n",
    "    \"\"\"\n",
    "    srcPath = picture_path+\".jpg\"\n",
    "    dstPath = picture_path+\".png\"\n",
    "\n",
    "    # The context manager closes the source file once the crop has been saved.\n",
    "    with Image.open(srcPath) as img_1:\n",
    "        img_2 = img_1.crop(crop_box)\n",
    "        img_2.save(dstPath)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 下载为pdf"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "“校园欺凌”的网络表达与治理——基于LDA主题模型的大数据分析----下载成功\n",
      "大数据时代人工智能在网络技术中的应用研究----下载成功\n",
      "基于大数据时代下的网络安全问题探析----下载成功\n",
      "大数据在突发事件网络舆情分析中的应用----下载成功\n",
      "大数据背景下信息通信网络安全管理策略研究----下载成功\n",
      "大数据时代背景下企业网络精准营销的策略探索----下载成功\n",
      "大数据背景下计算机网络信息安全风险和解决对策研究----下载成功\n",
      "基于大数据背景下人工智能在计算机网络技术中的应用----下载成功\n",
      "大数据背景下计算机远程网络通信技术变革探究----下载成功\n",
      "大数据时代计算机网络安全防范探析----下载成功\n",
      "大数据背景下计算机网络信息安全问题分析----下载成功\n",
      "大数据技术在5G通信网络中的应用研究----下载成功\n",
      "基于大数据信息网络的毕业生就业创业指导工作应用研究----下载成功\n",
      "大数据时代计算机网络安全系统设计----下载成功\n",
      "云计算在计算机网络安全存储中的应用——评《云存储安全：大数据分析与计算的基石》----下载成功\n",
      "基于大数据分析的高职网络教学质量评价系统研究----下载成功\n",
      "大数据时代下计算机网络安全防御系统设计与实现分析----下载成功\n",
      "乡村旅游地网络口碑的大数据分析——以南通洲际绿博园为例----下载成功\n",
      "地方政府大数据治理政策的注意力变迁——基于政策文本的扎根理论与社会网络分析----下载成功\n",
      "高校就业网络信息系统大数据平台的架构与安全设计----下载成功\n",
      "大数据时代人工智能在计算机网络技术中的应用----下载成功\n",
      "基于大数据背景的医院网络信息安全防范分析----下载成功\n",
      "大数据背景下基于网络搜索数据商品零售价格指数预测研究----下载成功\n",
      "基于中间件技术的网络处理器气候大数据多级存储系统----下载成功\n",
      "基于大数据与网络态势感知的网站安全管理研究----下载成功\n",
      "浅谈大数据时代的计算机网络安全及防范----下载成功\n",
      "大数据背景下网络信息安全技术体系分析----下载成功\n",
      "大数据时代计算机网络安全及防范措施研究----下载成功\n",
      "大数据背景下的计算机网络信息安全分析----下载成功\n",
      "大数据和云计算环境下网络安全分析与解决方案研究----下载成功\n",
      "基于大数据的并行化深度卷积神经网络优化算法----下载成功\n",
      "刍议大数据时代的计算机网络安全和防范策略----下载成功\n",
      "大数据背景下计算机网络信息安全探究----下载成功\n",
      "大数据赋能下网络借贷的价值共创模式研究——来自Lending Club的证据----下载成功\n",
      "5G通信网络对大数据技术的发展与促进----下载成功\n",
      "网络安全分析中的大数据技术研究----下载成功\n",
      "基于大数据的校园网络安全研究----下载成功\n",
      "大数据时代人工智能在计算机网络技术中的应用----下载成功\n",
      "云计算与大数据技术在广电有线网络中的应用----下载成功\n",
      "探究大数据时代计算机网络信息安全问题----下载成功\n",
      "大数据时代背景下计算机网络安全防范应用与运行分析----下载成功\n",
      "大数据时代计算机网络信息安全及防护探讨----下载成功\n",
      "大数据时代成人高校网络安全研究----下载成功\n",
      "筑牢大数据时代网络安全防线  为数字经济健康发展保驾护航——山东华软金盾软件股份有限公司高级副总裁张树强----下载成功\n",
      "高校学生网络舆情管理应对路径探究——评《高校学生网络话语与网络舆情引导研究——基于“大数据”的视域》----下载成功\n",
      "大数据时代食品行业网络营销发展----下载成功\n",
      "大数据下的校园无线网络优化----下载成功\n",
      "大数据背景下宽带网络维护系统架构的探究----下载成功\n",
      "网络安全分析中的大数据技术应用分析----下载成功\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "\n",
    "data = pd.read_excel(\"CNKI_数据挖掘.xlsx\")\n",
    "# CNKI site root.\n",
    "base = \"https://kns.cnki.net/\"\n",
    "# Slice of the table handled by this run: rows count .. end_count - 1.\n",
    "count = 451\n",
    "end_count = 500\n",
    "title_list = data[\"标题\"].to_list()[count:end_count]\n",
    "# The detail-page links (column 链接) are opened; the PDF button is clicked there.\n",
    "download_url_list = data[\"链接\"].to_list()[count:end_count]\n",
    "\n",
    "# Credentials for the captcha-recognition service are secrets, so they are read\n",
    "# from the environment instead of being stored in the notebook.\n",
    "ttshitu_user = os.environ.get(\"TTSHITU_USER\")\n",
    "ttshitu_pwd = os.environ.get(\"TTSHITU_PWD\")\n",
    "# Screenshots are written below ./code, so the directory has to exist.\n",
    "os.makedirs(\"./code\", exist_ok=True)\n",
    "\n",
    "for title,download_url in zip(title_list,download_url_list):\n",
    "    try:\n",
    "        driver.get(download_url)\n",
    "        time.sleep(1.5)\n",
    "        # Clear the link's target attribute before it is clicked.\n",
    "        js = 'document.getElementById(\"pdfDown\").setAttribute(\"target\",\"\");'\n",
    "        driver.execute_script(js)\n",
    "        time.sleep(1.5)\n",
    "        driver.find_element_by_xpath('//li[@class=\"btn-dlpdf\"]').click()\n",
    "        time.sleep(1.5)\n",
    "        source = driver.page_source\n",
    "        if \"安全验证\" in source: # a captcha is required: solve it through the API\n",
    "            print(\"已经进入验证码阶段\")\n",
    "            time.sleep(2)\n",
    "            if not (ttshitu_user and ttshitu_pwd):\n",
    "                raise RuntimeError(\"未设置 TTSHITU_USER / TTSHITU_PWD 环境变量，无法识别验证码\")\n",
    "            # The captcha is cut out of a screenshot of the browser window.\n",
    "            picture_name = f\"./code/{uuid4()}\"\n",
    "            driver.get_screenshot_as_file(picture_name+\".jpg\")\n",
    "            cut_picture(picture_name)\n",
    "            \n",
    "            result = base64_api(uname=ttshitu_user, pwd=ttshitu_pwd, img=picture_name+\".png\", typeid=3)\n",
    "            print(\"识别结果为：\",result) # recognised captcha text\n",
    "            driver.find_element_by_id('vcode').send_keys(result) # type it into the captcha field\n",
    "            time.sleep(5)\n",
    "            driver.find_element_by_xpath('/html/body/div/form/dl/dd/button').click() # submit to start the download\n",
    "            print(f'{title}----下载成功')\n",
    "        else: # no captcha was shown\n",
    "            print(f'{title}----下载成功')\n",
    "    except Exception as e:\n",
    "        print(e)\n",
    "        print(f'{title}----没有下载权限')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 导出refworks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Handles to the next-page element and the select-all control of the result list.\n",
    "next_page=driver.find_element_by_id('PageNext')\n",
    "# Named select_all rather than `all` so that the built-in all() is not shadowed.\n",
    "select_all=driver.find_element_by_xpath('//*[@id=\"selectCheckAll1\"]')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "2"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "3"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "4"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "5"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "6"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "7"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "8"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "9"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Click the select-all control on the current result page, move to the next\n",
    "# page, and repeat ten times; the loop index is displayed as progress.\n",
    "for page_index in range(10):\n",
    "    select_all_box = driver.find_element(\"xpath\", '//*[@id=\"selectCheckAll1\"]')\n",
    "    select_all_box.click()\n",
    "    next_button = driver.find_element(\"id\", 'PageNext')\n",
    "    next_button.click()\n",
    "    time.sleep(5)\n",
    "    display(page_index)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [],
   "source": [
    "from selenium.webdriver.common.action_chains import ActionChains\n",
    "\n",
    "# Move the mouse over the second entry of the #batchOpsBox list\n",
    "# (presumably to open its drop-down menu; confirm against the page).\n",
    "move = driver.find_element(\"xpath\", '//*[@id=\"batchOpsBox\"]/li[2]/a')\n",
    "hover = ActionChains(driver)\n",
    "hover.move_to_element(move)\n",
    "hover.perform()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Hover over the first sub-menu entry, then click the eighth item of its nested\n",
    "# list (presumably the RefWorks export format; confirm against the page).\n",
    "move = driver.find_element(\"xpath\", '//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/a')\n",
    "ActionChains(driver).move_to_element(move).perform()\n",
    "export_entry = driver.find_element(\"xpath\", '//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/ul/li[8]/a')\n",
    "export_entry.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-EC67A790652F6652D697180A0DB6DF2B',\n",
       " 'CDwindow-2014911FDD4196BE0AE18AA884FB8E99',\n",
       " 'CDwindow-1A2350684C2B4E99F23192CE7A3B8B89']"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Switch windows: list the handles of the windows the driver currently has open.\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-47-dd0a1399d54d>:1: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[-1])\n"
     ]
    }
   ],
   "source": [
    "# Switch to the last window handle. switch_to.window replaces switch_to_window,\n",
    "# which Selenium reports as deprecated.\n",
    "driver.switch_to.window(driver.window_handles[-1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 导出\n",
    "element=driver.find_element_by_xpath('//*[@id=\"litotxt\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 刘爱楼;\\n',\n",
       " 'AD 湖北师范大学心理健康教育与咨询中心;\\n',\n",
       " 'T1 基于网络大数据的大学生自杀风险主动识别与及时干预\\n',\n",
       " 'JF 佳木斯职业学院学报\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 07\\n',\n",
       " 'vo 37\\n',\n",
       " 'OP 60-62\\n',\n",
       " 'K1 大数据;自杀风险;主动识别;及时干预;大学生\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 伴随信息时代的到来与快速发展,信息技术正在以迅猛态势渗透于社会的方方面面。大数据作为随信息时代运用而生的概念,近年来得到心理学领域的广泛关注。本文以网络大数据概念及技术视角下对高校自杀干预应用为切入点,在介绍大数据技术在危机干预中实际应用的基础上,总结其对高校危机干预理论研究和实践运用产生的影响。高校危机干预作为以个体外部表现数据为主要分析对象的工作,大数据技术能够直接提高其主动识别的精准度、增强个性化干预的效果。\\n',\n",
       " 'SN 2095-9052\\n',\n",
       " 'CN 23-1590/G4\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李焱文;蒋文华;王纯洁;\\n',\n",
       " 'AD 华南理工大学经济与金融学院;山西省文化旅游投资控股集团有限公司;\\n',\n",
       " 'T1 网络大数据信用风险评分能有效预测信贷违约风险吗？\\n',\n",
       " 'JF 经济问题\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 07\\n',\n",
       " 'OP 70-77\\n',\n",
       " 'K1 信用风险评分;网络借贷;逾期违约;大数据风控\\n',\n",
       " ' credit risk score;online lending;overdue default;big data risk control\\n',\n",
       " '\\n',\n",
       " 'AB 利用互联网个人小额消费信贷的大样本微观数据,分析借款人互联网信用风险评分与其贷款违约风险的关系。研究结果显示,基于互联网大数据的个人信用风险评分系统,无论是公司自主研发的信用评分卡,还是权威第三方研发的欺诈评分卡,均能够预测网络借款人的违约风险,网络信用风险高的借款人逾期违约率、逾期未结清率更高,需要更多次催收才能最终结清借款。除此之外,借款金额、借款次数等借款特征以及性别、年龄和户籍属性等借款人特征的作用仍不容忽视。利用人工智能和机器学习等先进技术手段更深入地分析借款人信息,完善基于互联网大数据的风控体系,对于降低网络借贷市场的风险至关重要。\\n',\n",
       " 'SN 1004-972X\\n',\n",
       " 'CN 14-1058/F\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 周晶波;\\n',\n",
       " 'AD 广西大学行健文理学院商学部;\\n',\n",
       " 'T1 大数据时代计算机网络信息安全研究——评《网络安全态势感知:提取、理解和预测》\\n',\n",
       " 'JF 安全与环境学报\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 03\\n',\n",
       " 'vo 21\\n',\n",
       " 'OP 1388\\n',\n",
       " 'K1 网络安全态势感知;安全攻击;大数据技术;大数据安全;技术模型;《网络安全态势感知:提取、理解和预测》;主动防御;信息安全研究;大数据时代;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>数据是计算机网络最主要的信息交流内容,数据信息安全关系着整个计算机网络的安全。在大数据时代,海量数据蕴含着丰富的信息,通过对海量数据进行建模分析,可以对事物发展态势进行有效预判,并提前制定应对方案。大数据技术在信息安全领域有着广泛的应用,尤其是在计算机网络安全领域,利用大数据态势感知安全技术能够构建主动防御体系,提高计算机网络安全防护水平。\\n',\n",
       " 'SN 1009-6094\\n',\n",
       " 'CN 11-4537/X\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 任思颖;\\n',\n",
       " 'AD 吉林司法警官职业学院;\\n',\n",
       " 'T1 大数据时代人工智能在计算机网络技术中的运用\\n',\n",
       " 'JF 科技经济导刊\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 19\\n',\n",
       " 'vo 29\\n',\n",
       " 'OP 1-2\\n',\n",
       " 'K1 人工智能;计算机网络技术;网络安全;网络建设\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 近年来,人们生活之中出现了很多高科技产品,人工智能在人们生活中被广泛应用。因此,在大数据时代下,对于人工智能的研究十分重要。人工智能研究的是让没有思想的机器在程序的指导下去完成一些特殊的工作,参考的是人类的基本行为。它的应用极为广泛,本文将介绍其在计算机网络技术这一方面有关网络安全的应用。\\n',\n",
       " 'SN 2096-1995\\n',\n",
       " 'CN 37-1508/N\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 刘付桂兰;\\n',\n",
       " 'AD 广东外语外贸大学;\\n',\n",
       " 'T1 大数据时代下计算机网络信息安全问题的探讨与防范\\n',\n",
       " 'JF 科技经济导刊\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 17\\n',\n",
       " 'vo 29\\n',\n",
       " 'OP 40-41\\n',\n",
       " 'K1 大数据;数据安全;信息安全\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 大数据时代下,人们的生活越来越数据信息化,社交数据化,出行数据化,财产数据化,甚至人们的生命健康也越来越数据化。生活的数据化给人们带来方便的同时,也给人们带来了很多的隐患。保护我们的信息安全,成为刻不容缓的第一要事。\\n',\n",
       " 'SN 2096-1995\\n',\n",
       " 'CN 37-1508/N\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李秉裕;王佳宝;樊科;姚勇志;\\n',\n",
       " 'AD 辽宁工业大学;\\n',\n",
       " 'T1 基于大数据的电力信息系统网络安全分析\\n',\n",
       " 'JF 电子世界\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 11\\n',\n",
       " 'OP 65-66\\n',\n",
       " 'K1 电力信息系统;安全风险;电力信息网络;网络安全分析;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>1电力信息系统网络存在的安全风险因素在目前电力行业发展过程中,由于在信息化技术的影响下,会产生很多的数据信息,特别是在目前日益先进的电力系统中,海量的电力信息数据不仅能够为整个电力系统的运行和发展带来非常重要的数据依据,在后期需要信息处理时也能够根据内部储存的海量信息提供有效的技术支持。目前在整体电力信息系统网络发展过程中依旧存在一定的安全风险,\\n',\n",
       " 'SN 1003-0522\\n',\n",
       " 'CN 11-2086/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 唐培全;戴小佳;\\n',\n",
       " 'AD 华能山东发电有限公司;华能山东发电有限公司八角电厂;\\n',\n",
       " 'T1 基于大数据时代的计算机网络安全技术应用分析\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 06\\n',\n",
       " 'OP 52-53\\n',\n",
       " 'K1 大数据时代;计算机;网络安全\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 随着社会的不断发展和进步,人类社会的和以前相比有了很多变化,人类生活和网络联系日益密切,数字化大数据时代是如今这个时代的重要标签,网络安全的重要性越来越明显。作为世界上拥有最多互联网用户和数据量的发展中国家,网络安全领域的问题对于我国是一个重要问题。本文首先介绍了大数据和网络安全的含义,分析了网络安全在中国的现状和问题,同时在文本的最后结合时代对网络安全技术的要求和需要,分析了其在大数据时代的应用,并对其在未来的发展进行了预测。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 付蓉;\\n',\n",
       " 'AD 大连理工大学城市学院;\\n',\n",
       " 'T1 大数据下的计算机网络信息安全分析\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 06\\n',\n",
       " 'OP 58-59\\n',\n",
       " 'K1 大数据时代;计算机网络信息安全;病毒查杀\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 近年来,信息技术的推广普及使得人们的生活和工作发生了深刻变化,在这个过程中,互联网的应用也催生了很多新的技术,大数据就是比较典型的一种新型科技。大数据环境下,计算机网络安全更加重要,同时也更容易受到威胁,因此必须高度重视大数据环境下的计算机网络信息安全。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 杨远正;\\n',\n",
       " 'AD 宁国人力资源和社会保障局;\\n',\n",
       " 'T1 大数据时代计算机网络技术在信息化管理中的应用\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 06\\n',\n",
       " 'OP 61-62\\n',\n",
       " 'K1 大数据时代;计算机网络技术;信息化管理\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 随着经济的发展,计算机网络技术也在不断创新和进步,被应用在人们的生产和生活中,为人们提供便利。在市场经济环境下,相关单位若想得到更好的发展,则需要合理使用计算机网络技术在信息化管理中,保证管理工作能够加速进程,提升管理效率和水平,合理配置相关资源。本文主要阐述相关单位在大数据时代信息化管理中如何使用计算机网络技术,仅供参考。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 傅望;\\n',\n",
       " 'AD 浙江警官职业学院;\\n',\n",
       " 'T1 大数据背景下计算机网络安全防范措施探析\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 06\\n',\n",
       " 'OP 153-154\\n',\n",
       " 'K1 大数据背景下;计算机网络安全;防范措施\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 随着我国社会的发展和进步,计算机网络技术飞速发展,它已经渗透到了人们生活、工作、学习、生产的各个领域和层面。大数据信息时代的到来,给计算机网络技术的发展带来了机遇,同时也使其面临着诸多挑战,计算机网络安全成为当下备受关注的问题。本文主要分析大数据背景下计算机网络安全特点以及存在的问题,并进行相关的防范措施探析,以期为解决大数据时代计算机网络安全问题提供一定的解决思路和策略。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 马会端;\\n',\n",
       " 'AD 东北大学马克思主义学院;\\n',\n",
       " 'T1 大数据系统推介下的网络消费异化：表征、溯因及消解\\n',\n",
       " 'JF 河南师范大学学报(哲学社会科学版)\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 03\\n',\n",
       " 'vo 48\\n',\n",
       " 'OP 41-47\\n',\n",
       " 'K1 大数据;网络消费;消费异化;消费行为;自由异化\\n',\n",
       " ' big data;internet consumption;consumption alienation;consumption behavior;alienation of freedom\\n',\n",
       " '\\n',\n",
       " 'AB 大数据推介系统促进了网络消费的便捷性、多样性以及普遍性。消费异化、网络消费异化、大数据推介系统以及网络消费行为自由异化之间具有内在的逻辑关联。网络消费异化是消费异化的特殊表现形式,而大数据推介系统则构成了网络消费中消费行为自由异化的技术诱因。人们的消费需求、消费心理、消费对象、消费环境异化等是导致网络消费异化问题的基本因素,而这些因素又共同构成了人们进行消费选择的前提条件,并由此导致了网络消费选择中符号化、同质化、被动化等消费行为自由异化的现象。网络消费作为满足人的消费需求的一种手段,基于现实需求的自由消费行为在大数据系统推介下产生了自由的异化,或者说成了一种受大数据推介技术所宰制的异化了的消费自由。在本质上,这种异化了的消费自由是一种消极的消费自由。因此,要在技术开发与实践过程中确立道德责任,促进技术应用者内在德性的养成,让消费者的消费行为建立在自决的判断和选择基础之上。\\n',\n",
       " 'SN 1000-2359\\n',\n",
       " 'CN 41-1011/C\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 孔浩;刘彬;\\n',\n",
       " 'AD 中国工商银行山东省分行金融科技部;\\n',\n",
       " 'T1 大数据分析助力银行网络运维转型发展\\n',\n",
       " 'JF 中国金融电脑\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 06\\n',\n",
       " 'OP 73-75\\n',\n",
       " 'K1 网络;数据;扁平化\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 近年来,各金融机构陆续开展网络扁平化改造,网络扁平化后如何对大量网点线路质量进行检测,对比分析各运营商专线质量,并通过有效手段提升网络线路稳定性成为网络管理工作的新课题。山东工行基于大数据分析手段,开发出一套用于解决金融网络扁平化模式下的网络线路分析系统和管理模式。该系统在山东工行实际投入使用后网络线路整体运行质量得到显著提高,运维复杂度得到有效降低,同时提升了网络管理标准化和自动化程度。\\n',\n",
       " 'SN 1001-0734\\n',\n",
       " 'CN 11-2623/F\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李震乾;\\n',\n",
       " 'AD 江西洪州职业学院;\\n',\n",
       " 'T1 大数据背景下计算机网络安全防范措施研究\\n',\n",
       " 'JF 科技与创新\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 11\\n',\n",
       " 'OP 108-109\\n',\n",
       " 'K1 大数据;计算机;网络安全;物联网\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 在大数据时代背景下,计算机网络已经成为中国人民日常生活中的重要部分,能够为中国人民的工作和学习带来诸多便利,但是在计算机网络系统的运行过程中,普遍存在各种各样的网络安全问题,无法保证计算机用户的信息安全,甚至会带来较大的损失。鉴于此,针对大数据背景下计算机网络安全存在的问题进行分析,并提出一些具体的防范措施,希望能为计算机网络安全工作提供一些有效参考。\\n',\n",
       " 'SN 2095-6835\\n',\n",
       " 'CN 14-1369/N\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 黄晓平;\\n',\n",
       " 'AD 肇庆市科技中等职业学校;\\n',\n",
       " 'T1 大数据时代计算机远程网络通信技术的应用研究\\n',\n",
       " 'JF 科学咨询(科技·管理)\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 06\\n',\n",
       " 'OP 227-228\\n',\n",
       " 'K1 大数据;计算机;远程网络;通信技术\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 在大数据时代的发展背景下,计算机远程网络通信技术的开发和应用程度越来越高,推动着我国信息化技术快速向前发展。本文针对大数据时代下计算机远程网络通信技术的具体应用展开全面分析和研究,对计算机网络通信技术使用存在的问题进行了阐述,同时对计算机远程网络通信技术的应用和创新工作进行了探索,以全面提高计算机远程网络通信技术的应用效果。\\n',\n",
       " 'SN 1671-4822\\n',\n",
       " 'CN 50-1143/N\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 武燕平;\\n',\n",
       " 'AD 江苏省连云港工贸高等职业技术学校;\\n',\n",
       " 'T1 大数据背景下的网络信息安全控制策略分析\\n',\n",
       " 'JF 产业与科技论坛\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 11\\n',\n",
       " 'vo 20\\n',\n",
       " 'OP 287-288\\n',\n",
       " 'K1 大数据;网络信息安全;控制策略\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 互联网的快速发展,网络给我们生活、工作带来便利,极大地提高工作效率。特别是大数据时代的到来,人们更加地依赖网络传输各类数据信息,同时,也产生了一系列的安全问题如数据信息非法盗取、网络病毒的传播等,给人们的工作、生活造成困扰。因此需要进一步加强大数据背景下网络信息安全问题控制策略的探究,从而为网络用户营造一个安全、稳定的网络工作环境。\\n',\n",
       " 'SN 1673-5641\\n',\n",
       " 'CN 13-1371/F\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 许妙水;\\n',\n",
       " 'AD 新中冠智能科技股份有限公司;\\n',\n",
       " 'T1 计算机网络中大数据与人工智能技术的应用\\n',\n",
       " 'JF 计算机与网络\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'vo 47\\n',\n",
       " 'OP 37\\n',\n",
       " 'K1 人工智能技术;网络安全事故;网络管理质量;技术的应用;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>随着计算机网络技术快速发展,工作和生活中的自动化水平变得更高,社会发展迈入了新的阶段。人工智能技术具有模拟人脑思维做出动作,以及通过编程自动发出指令的特性,将其和大数据运用到计算机网络中,可促进安全管理水平的提升,也有利于计算机网络系统的优化和管理。本文以计算机网络为对象,针对大数据与人工智能技术在其中的应用,进行深入探讨。当前计算机网络发展,已经成为一个国家发展水平的重要评判标准,所以应不断地研究、促进计算机网络进一步发展。人工智能技术可借助于虚拟技术,依照人的思维方式下达指令,代替人类完成工作。\\n',\n",
       " 'SN 1008-1739\\n',\n",
       " 'CN 13-1223/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 马颖;\\n',\n",
       " 'AD 新疆交通职业技术学院;\\n',\n",
       " 'T1 大数据时代的计算机网络安全防范策略\\n',\n",
       " 'JF 计算机与网络\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'vo 47\\n',\n",
       " 'OP 52\\n',\n",
       " 'K1 安全防范策略;网络安全问题;防火墙;大数据时代;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>随着社会的发展科技水平得日益提高,计算机早已在人们的生活中占据了重要地位,然而随着计算机网络中的数据量不断增多,很多网络问题便浮现出来,从而阻碍了计算机网络的平稳运行。本文对大数据时代的计算机网络安全进行了简要的探讨。大数据与计算机网络安全大数据的定义在日益进步的当代社会,人们的需求与以往大不相同。与传统互联网相比,大数据具有更大型的数据库,存储的数据信息也变得更多,大数据的出现使人们无论是工作还是生活,都有了很大的改变。\\n',\n",
       " 'SN 1008-1739\\n',\n",
       " 'CN 13-1223/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 刘博;邓舒平;杨楠;郑继辉;谢金龙;\\n',\n",
       " 'AD 云南电网有限责任公司玉溪供电局;云南电网有限责任公司;\\n',\n",
       " 'T1 智能网络下职业健康风险大数据分析方法\\n',\n",
       " 'JF 信息技术\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 128-134\\n',\n",
       " 'K1 职业健康;数据挖掘;AdaBoost算法;BP神经网络模型;可视化\\n',\n",
       " ' occupational health;data mining;AdaBoost algorithm;BP neural network model;visualization\\n',\n",
       " '\\n',\n",
       " 'AB 针对目前职业健康数据大、技术分析落后的问题,提出了新型的解决方法。该方法构建出包括数据获取层、数据存储层、数据处理层和数据分析层的系统架构,实现了职业健康大数据的采集、存储、计算和数据传递。该研究方法还采用大数据挖掘算法实现职业健康大数据的微观分析,通过AdaBoost算法实现不同健康大数据的关联分析,通过BP神经网络模型实现健康大数据的故障诊断,又采用可视化技术实现数据的集合与映射,提高职业健康大数据的管控,试验表明,该研究的方法数据处理速度快,准确率大于95%。\\n',\n",
       " 'SN 1009-2552\\n',\n",
       " 'CN 23-1557/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 陈辉彬;\\n',\n",
       " 'AD 北海职业学院;\\n',\n",
       " 'T1 大数据环境下的网络考试平台的开发及应用研究\\n',\n",
       " 'JF 电脑知识与技术\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 15\\n',\n",
       " 'vo 17\\n',\n",
       " 'OP 74-75\\n',\n",
       " 'K1 大数据环境;网络考试平台;开发应用\\n',\n",
       " ' big data environment;network examination platform;development and application\\n',\n",
       " '\\n',\n",
       " 'AB 该文针对大数据环境下,网络考试平台的开发措施,从基础性设计、应用性开发、数据建设质量,三方面展开探讨总结;并针对网络考试平台的应用措施,从题库管理、试卷管理、考试管理以及成绩管理,这四个方面进行探究分析,以期能够为网络考试平台的高效应用,提供参考性建议。\\n',\n",
       " 'SN 1009-3044\\n',\n",
       " 'CN 34-1205/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李新新;\\n',\n",
       " 'AD 廊坊市市场监督管理局;\\n',\n",
       " 'T1 大数据技术在网络入侵检测的应用\\n',\n",
       " 'JF 信息技术与信息化\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 235-237\\n',\n",
       " 'K1 大数据;数据挖掘;网络入侵检测;病毒\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 针对大数据技术在网络入侵检测的应用,采用理论结合实践的方法,先分析了目前网络入侵检测发展现状,接着探讨了常见的网络入侵方式,最后分析大数据挖掘技术在网络入侵检测的应用要点和网络入侵检测系统的性能测试。分析结果表明,将大数据应用到网络入侵检测中,可有效防止病毒、黑客、拒绝服务等对计算机网络系统造成危害和影响,从而保证网络系统中数据的安全性。\\n',\n",
       " 'SN 1672-9528\\n',\n",
       " 'CN 37-1423/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李鹏举;\\n',\n",
       " 'AD 中国联合网络通信有限公司邯郸市分公司;\\n',\n",
       " 'T1 简析大数据背景下信息通信网络安全管理策略\\n',\n",
       " 'JF 数字技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'vo 39\\n',\n",
       " 'OP 184-186\\n',\n",
       " 'K1 大数据技术;信息通信;网络安全;管理策略\\n',\n",
       " ' Big data technology;Information communication;Network security;Management strategy\\n',\n",
       " '\\n',\n",
       " 'AB 在互联网大数据高速发展的现阶段,电子政务管理系统成为地方政府提高决策效率,精准快速下达相关政策的重要工具。电子政务系统主要利用了大数据进行系统分析,发挥出互联网数据技术应用的优势,建设了系统的体系。笔者在本文中主要就在电子政务管理盛行的今天,有关部门应该怎样对网络安全进行有效的管理。\\n',\n",
       " 'SN 1007-9416\\n',\n",
       " 'CN 12-1369/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 格桑次仁;\\n',\n",
       " 'AD 西藏职业技术学院;\\n',\n",
       " 'T1 大数据背景下计算机信息技术在网络安全中的运用探析\\n',\n",
       " 'JF 数字技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'vo 39\\n',\n",
       " 'OP 190-192\\n',\n",
       " 'K1 大数据;计算机;信息技术;网络安全\\n',\n",
       " ' Big data;Computer;Information technology;Network security\\n',\n",
       " '\\n',\n",
       " 'AB 随着计算机信息技术的快速发展,\"大数据\"概念随之出现。\"大数据\"对人们生产生活的影响越来越深,同时相应的网络安全问题也亟待解决。基于此,本文分析了在\"大数据\"的背景下危害网络安全的因素,研究了在\"大数据\"的背景下计算机信息技术在网络安全中的应用,以供参考。\\n',\n",
       " 'SN 1007-9416\\n',\n",
       " 'CN 12-1369/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 郑昕;\\n',\n",
       " 'AD 广州达智教育管理有限公司;\\n',\n",
       " 'T1 大数据背景下网络营销对策\\n',\n",
       " 'JF 营销界\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 21\\n',\n",
       " 'OP 5-6\\n',\n",
       " 'K1 网络营销;沃尔玛;大数据时代;大数据背景下;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>随着时代的发展,社会的进步,经济的迅速攀升,我国在各个领域都出现了变革与优化,尤其在大数据方面,获得了不小的成就。反之大数据逐渐改变了人们的生活、学习、工作等多个方面,在大数据的衍生下,网络营销随之出现;相比传统式的营销模式来看,网络营销并没有突破传统式营造模式所带来的营销弊端,所以只能说我国在营销方面的形式有所进步,但在营销内容方面还有待创新,那么如何提升网络营销在现今整体营销中的重要性,是当前大数据时代下。我们必须要考虑的问题。因此本文重点以大数据背景下网络营销对策,展开相关探讨。\\n',\n",
       " 'CN 41-1405/F\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 白贺伊;\\n',\n",
       " 'AD 西安广播电视大学;\\n',\n",
       " 'T1 基于卷积神经网络的健康大数据智能分析方法研究\\n',\n",
       " 'JF 电子设计工程\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'vo 29\\n',\n",
       " 'OP 10-14\\n',\n",
       " 'K1 卷积神经网络;词向量;医疗数据;大数据分析;疾病风险评估\\n',\n",
       " ' convolutional neural network;word vector;medical data;big data analysis;disease risk assessment\\n',\n",
       " '\\n',\n",
       " 'AB 针对充分挖掘医疗健康大数据中有效信息不深入,智能化分析平台功能开发受限等问题,文中基于卷积神经网络,提出了一种适用于对医疗健康大数据进行智能化分析的方法。该方法通过分布式表示法对医疗文本数据进行数字化处理,得到相应特征的词向量表示,利用卷积神经网络不断训练与学习,得到不同数据集对应各个疾病的分析模型,再利用该模型完成对患者数据的智能分析与风险评估。实验结果表明,文中方法能够完成对多种疾病的风险评估,尤其对一般疾病数据集风险评估的准确率均可达到90%以上,验证了该方法的有效性、可靠性与通用性。\\n',\n",
       " 'SN 1674-6236\\n',\n",
       " 'CN 61-1477/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李培培;\\n',\n",
       " 'AD 郑州旅游职业学院;\\n',\n",
       " 'T1 大数据与计算机网络的信息安全策略分析\\n',\n",
       " 'JF 电子技术\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'vo 50\\n',\n",
       " 'OP 110-111\\n',\n",
       " 'K1 大数据;计算机网络;信息安全\\n',\n",
       " ' big data;computer network;information security\\n',\n",
       " '\\n',\n",
       " 'AB 阐述基于大数据的计算机网络信息系统遇到的安全问题,并提出应对措施,包括计算机系统中设置防火墙、有效的防护程序应用、监控计算机系统中的网络数据,从而保障网络信息的安全。\\n',\n",
       " 'SN 1000-0755\\n',\n",
       " 'CN 31-1323/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 潘继财;\\n',\n",
       " 'AD 中国科学技术信息研究所;\\n',\n",
       " 'T1 大数据样本与半监督环境下基于生成对抗网络的故障诊断\\n',\n",
       " 'JF 机械与电子\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'vo 39\\n',\n",
       " 'OP 20-25\\n',\n",
       " 'K1 大数据样本;半监督;生成对抗网络;梯度函数;分类诊断\\n',\n",
       " ' big data sample;semi-supervision;generation countermeasure network;gradient function;classification diagnosis\\n',\n",
       " '\\n',\n",
       " 'AB 在大故障样本条件下,提出一种基于生成对抗网络模型的故障诊断方法研究。构建生成对抗网络模型,保证模型判别器输出数据的总体分布与原始故障集趋同,并基于空间测量工具对梯度函数进行优化,降低损失;采用故障集图像转换方式实现对原始信号的降维处理,利用判别器的神经网络结构训练输入数据,并提取出机械故障数据集中的故障特征点。实验结果表明,提出方法具有良好的分类诊断性能,故障诊断精度能够达到99.45%。\\n',\n",
       " 'SN 1001-2257\\n',\n",
       " 'CN 52-1052/TH\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李文;张珍珍;梅蕾;\\n',\n",
       " 'AD 内蒙古科技大学经济与管理学院;\\n',\n",
       " 'T1 企业网络、大数据能力与商业模式创新机制研究——基于fs QCA方法的实证分析\\n',\n",
       " 'JF 科技进步与对策\\n',\n",
       " 'OP 1-10\\n',\n",
       " 'K1 企业网络;大数据能力;商业模式创新;定性比较分析\\n',\n",
       " ' EnterpriseNetwork;BigDataCapability;BusinessModelInnovation;QCA\\n',\n",
       " '\\n',\n",
       " 'AB 商业模式创新是企业竞争优势的重要来源,在当前激烈的竞争环境下,企业间竞争不仅是产品竞争,更是商业模式竞争。基于组态视角和集合论思想,从企业网络与大数据能力匹配视角,运用模糊集定性比较分析fs QCA方法,对15家新零售企业商业模式创新案例进行研究,构建新零售企业商业模式创新匹配模型。结果发现,有4类促进新零售企业商业模式创新的牵引条件构型:网络体系建立助力型、资源整合能力促进型、深度分析能力弥补型和信息资源共享推动型,且每条路径间存在等效性。结论丰富了商业模式创新领域研究,可为企业实施商业模式创新提供理论支持和借鉴。\\n',\n",
       " 'SN 1001-7348\\n',\n",
       " 'CN 42-1224/G3\\n',\n",
       " 'LA 中文\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 曹仰之;\\n',\n",
       " 'AD 东莞职业技术学院;\\n',\n",
       " 'T1 基于大数据的计算机网络信息安全防护措施研究\\n',\n",
       " 'JF 电脑编程技巧与维护\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 167-168\\n',\n",
       " 'K1 大数据;信息安全;防护墙;双入侵检测\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 为了在大数据环境下打造数据信息安全防护体系,选取防火墙技术和入侵检测技术作为安全防护布设工具,针对计算机遭受网络攻击问题,拟定防护墙、双入侵检测网络安全防护措施。实践应用结果表明,防护墙与双入侵检测共同应用方案较传统安全防护方案的信息防护效果有了明显提升。\\n',\n",
       " 'SN 1006-4052\\n',\n",
       " 'CN 11-3411/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'T1 广电总局制定网络视听收视大数据行业标准播放数据将有统一标准\\n',\n",
       " 'JF 中国有线电视\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 490\\n',\n",
       " 'K1 网络视听;广电总局;统一标准;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>广电总局公布了\"国家广播电视总局科技司关于对《网络视听收视大数据技术规范第1部分:总体要求》等四项广播电视和网络视听行业标准报批稿进行公示的通知,公示中表明,广电总局对网络视听收视大数据制定了行业标准,网剧和网综的播放数据将有统一标准。\\n',\n",
       " 'SN 1007-7022\\n',\n",
       " 'CN 61-1309/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 陈伟;\\n',\n",
       " 'AD 贵州大学科技学院;\\n',\n",
       " 'T1 大数据时代计算机网络信息安全及防护策略探究\\n',\n",
       " 'JF 电子世界\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 09\\n',\n",
       " 'OP 10-11\\n',\n",
       " 'K1 网络信息安全;网络安全问题;杀毒软件;大数据时代;策略探究;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>如今,互联网已经发展到大数据时代,互联网保存了绝大部分人的隐私信息,这些信息一旦被泄露,将会给个人和企业都会带来巨大损失,甚至会成为间谍盗取国家机密的主要渠道。如何预防网络信息泄露、维护网络安全是目前需要解决的首要问题。\\n',\n",
       " 'SN 1003-0522\\n',\n",
       " 'CN 11-2086/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 郁陶;\\n',\n",
       " 'AD 德州职业技术学院;\\n',\n",
       " 'T1 大数据时代人工智能在计算机网络技术中的应用研究\\n',\n",
       " 'JF 电子世界\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 09\\n',\n",
       " 'OP 50-51\\n',\n",
       " 'K1 人工智能;数据库;专家知识库;人工神经网络;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>新兴技术一直都是计算机网络技术不断发展的强大驱动力,包括大数据、云计算、VR、AR和人工智能在内的多种新兴技术在计算机网络领域中的广泛应用,给网络用户带来了丰富的新体验。本文立足于大数据时代背景,分析了大数据与人工智能的关系,\\n',\n",
       " 'SN 1003-0522\\n',\n",
       " 'CN 11-2086/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 高慧;\\n',\n",
       " 'AD 新乡学院;\\n',\n",
       " 'T1 基于大数据的网络舆情多维动态分类研究\\n',\n",
       " 'JF 电脑知识与技术\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 14\\n',\n",
       " 'vo 17\\n',\n",
       " 'OP 15-17\\n',\n",
       " 'K1 大数据;网络舆情;多维;动态分类\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 由于网络舆情多维动态实际分类中,分类结果与实际情况存在一定误差,比值比(odds ratio,OR值)较小,为此提出基于大数据的网络舆情多维动态分类研究。通过对网络舆情概念、网络舆情特点等进行分析,构建网络舆情多维动态分类指标体系、基于大数据的事件类型多维度指标聚类分析、网络舆情数据分类判别,提出一种全新的分类方法。通过对比实验证明,该分类方法OR值明显增加,说明网络舆情多维动态分类结果与实际情况更接近,分类更加精确。\\n',\n",
       " 'SN 1009-3044\\n',\n",
       " 'CN 34-1205/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 王珊珊;梁同乐;\\n',\n",
       " 'AD 广东轻工职业技术学院信息技术学院;广东邮电职业技术学院计算机学院;\\n',\n",
       " 'T1 基于大数据技术的网络热搜关键词提取算法\\n',\n",
       " 'JF 电子测试\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'OP 48-49+97\\n',\n",
       " 'K1 大数据技术;网络热搜;关键词;提取算法\\n',\n",
       " ' big data technology;network hot search;keywords;extraction algorithm\\n',\n",
       " '\\n',\n",
       " 'AB 传统的网络热搜关键词提取方法查全率低,无法满足使用者的需求。因此,提出基于大数据技术的网络热搜关键词提取算法。确定网络热搜关键词特征的模糊空间,基于大数据加权融合网络热搜关键词,采用大数据技术Reduce中的稀疏表示技巧,实现网络热搜关键词提取。实验结果表明,实验组测得的查全率高于对照组两倍以上,可以弥补传统网络热搜关键词提取算法中存在的不足。\\n',\n",
       " 'SN 1000-8519\\n',\n",
       " 'CN 11-3927/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李晓霞;\\n',\n",
       " 'AD 淄博职业学院;\\n',\n",
       " 'T1 基于大数据时代人工智能在计算机网络技术中的应用\\n',\n",
       " 'JF 电子测试\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'OP 133-134\\n',\n",
       " 'K1 大数据;人工智能;网络技术;应用\\n',\n",
       " ' big data;artificial intelligence;network technology;application\\n',\n",
       " '\\n',\n",
       " 'AB 在这个大数据发展时代下,随着当前我国人工智能网络信息技术的不断创新和技术进步,为我国计算机网络信息技术的广泛应用发展,提供了更大的技术发展空间。在此课题研究基础上,深入人工智能在当前我国计算机学和人工智能技术中的应用,以及科学研究中的发展前景,进行了全面的学术研究。\\n',\n",
       " 'SN 1000-8519\\n',\n",
       " 'CN 11-3927/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 毛莉艳;\\n',\n",
       " 'AD 国家计算机网络应急技术处理协调中心广东分中心;\\n',\n",
       " 'T1 大数据技术在通信网络中的应用\\n',\n",
       " 'JF 电子技术与软件工程\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'OP 3-4\\n',\n",
       " 'K1 大数据技术;通信网络;云计算\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 本文首先分析了大数据技术在通信网络中的应用优势,其次对大数据技术在通信网络中的应用措施和现状进行了研究,在此基础上探索了大数据技术在通信网络应用存在的主要问题,并针对这些问题提出相应的解决方案。\\n',\n",
       " 'SN 2095-5650\\n',\n",
       " 'CN 10-1108/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 王玲玲;\\n',\n",
       " 'AD 德州职业技术学院;\\n',\n",
       " 'T1 计算机大数据分析与云计算网络技术应用研究\\n',\n",
       " 'JF 电子技术与软件工程\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'OP 154-155\\n',\n",
       " 'K1 计算机;大数据;云计算;网络技术\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 本文研究了计算机大数据分析和云计算网络技术,对于这两种相关联的技术进行深入分析,研究计算机大数据分析和云计算技术的具体应用情况。\\n',\n",
       " 'SN 2095-5650\\n',\n",
       " 'CN 10-1108/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李晓磊;李志辉;\\n',\n",
       " 'AD 周口广播电视台;\\n',\n",
       " 'T1 县市台大数据网络融媒体应用研究\\n',\n",
       " 'JF 影视制作\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'vo 27\\n',\n",
       " 'OP 70-74\\n',\n",
       " 'K1 融媒体;APP;手机台;大数据平台\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 本文主要介绍周口广播电视台推行的\"一市一中心,一县一平台,一乡一网站,一村一公号\"的大数据融媒体平台的应用,该平台以混合云(公有云+私有云)平台框架来布局,搭建市、县、乡三级平台,以此融合广播电视、新闻、党建、大数据、政务等服务,建成统一的运营平台,为用户构建云服务。多用户可以通过统一平台实现通用功能,同时用户可以通过融媒体平台实现手机台APP、微博、微信交互联网发布信息,政务系统和智慧城市系统也可以在大数据平台上交互运行,从而实现各种业务系统的对接。\\n',\n",
       " 'SN 1673-5218\\n',\n",
       " 'CN 11-5863/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李晓磊;赵宇;\\n',\n",
       " 'AD 河南周口广播电视台;河南周口职业技术学院;\\n',\n",
       " 'T1 县市级大数据网络融媒体平台应用研究\\n',\n",
       " 'JF 广播与电视技术\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'vo 48\\n',\n",
       " 'OP 69-72\\n',\n",
       " 'K1 融媒体;APP;手机台;大数据平台\\n',\n",
       " ' Converged media;APP;Mobile phone station;Big data platform\\n',\n",
       " '\\n',\n",
       " 'AB 打造融媒体中心,构建什么样的技术平台尤为重要。传统媒体已经无法满足人们对信息量快速传播的需求,传统媒体与新媒体融合就是应对需求的创新之举。本文认为在大数据的支持下,建设全媒体应用平台,以新媒体APP应用为依托整合系统架构,更有助于二者发挥独一无二的作用。\\n',\n",
       " 'SN 1002-4522\\n',\n",
       " 'CN 11-1659/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 莫靖聪;\\n',\n",
       " 'AD 桂林航天工业学院管理学院;\\n',\n",
       " 'T1 大数据背景下高校网络思想政治教育的安全风险对策研究\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 101-103\\n',\n",
       " 'K1 大数据;高校;思想政治教育;网络安全\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 大数据背景下,高校的网络思想政治教育存在诸多安全风险,这些安全风险具有较强的隐蔽性、难控性和复杂性。大量的网络数据让高校网络思想政治教育存在安全意识不到位、信息分类不限制、工作队伍不专业的问题。所以,高校要有效解决网络思想政治教育存在的安全风险,要加强顶层领导,提高网络思想政治教育安全意识;建立安全监管制度,规范网络安全使用规范;完善人才队伍建设,落实网络思想政治教育安全的底线思维。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 张玲玲;\\n',\n",
       " 'AD 山西铁道职业技术学院;\\n',\n",
       " 'T1 探讨大数据视域下的高校网络安全课程教学改革创新\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 114-115\\n',\n",
       " 'K1 大数据;高校;网络安全课程;教学改革;创新路径\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 随着大数据时代的来临,网络已经渗透到生活中的各个角落,社会网络安全频发,公民信息泄露频发等问题已成为当前互联网治理的重点。因此在高校中开展网络安全课程教育,如何推进高校网络安全课程改革,加快培育高素质网络安全人才,补齐社会对网络人才的需求缺口已成为当前社会亟待解决的重要课题。基于此,本文基于大数据视域下,探析了高校网络安教学改革创新的具体路径,以期为相关研究提供些许思路。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 王晓娜;李晓宇;李芙蓉;\\n',\n",
       " 'AD 北京北信源软件股份有限公司;\\n',\n",
       " 'T1 人工智能及大数据的网络安全态势感知研究\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 73-74\\n',\n",
       " 'K1 人工智能;大数据;网络安全;态势感知\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 企业生产运营中,面临的信息安全威胁比较大,安全攻击技术呈现多元化发展趋势。企业应当积极防范风险,通过科学措施,确保网络安全性,同时提升信息防护能力,以免企业受到安全威胁与攻击,维护企业信息安全与隐私安全,规避风险损失。此次研究基于大数据技术和人工智能技术,分析网络安全态势感知,仅供参考。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 董颖;\\n',\n",
       " 'AD 北京工业大学经济与管理学院;\\n',\n",
       " 'T1 大数据时代的网络黑客攻击与防范治理\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 68-70\\n',\n",
       " 'K1 大数据时代;网络安全;黑客攻击;防范治理\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 本文介绍了黑客攻击的基本流程,并基于大数据时代背景,分析黑客攻击在攻击手段、攻击方式、攻击范围和攻击心理四个方面呈现出的新特点,从安全管理、软件维护、体系构建、意识心理四个方面提出针对黑客攻击的有效防范治理措施。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 席攀锋;\\n',\n",
       " 'AD 甘肃建筑职业技术学院;\\n',\n",
       " 'T1 大数据时代计算机网络信息安全研究\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 70-71\\n',\n",
       " 'K1 大数据时代;计算机网络;信息安全\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 大数据属于海量数据信息整合、处理、计算的主要技术载体,其中包含着多元化的数据结构,更新速度很快,运行成本也较低,数据类型多种多样,甚至成为经济战略目标树立与落实的主要方向。但是,在大数据时代下计算机网络信息安全问题逐渐增多,如果不能合理进行安全的管控,将会对大数据时代下的计算机网络系统安全运行、稳定发展造成不利影响。因此,在大数据时代环境中应重点开展计算机网络信息安全管理工作、安全控制工作,借助先进技术维护计算机网络的安全性,争取可以在大数据时代下提升计算机网络系统运行的安全水平,为网络系统的后续良好使用夯实基础。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 马天午;\\n',\n",
       " 'AD 河北兰科网络工程集团有限公司;\\n',\n",
       " 'T1 大数据背景下计算机网络信息安全探究\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 157-159\\n',\n",
       " 'K1 大数据;计算机网络系统;网络信息安全\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 随着我国时代的发展,我国的信息技术水平得到了一定的进步与发展,计算机网络被广泛应用在各个方面。但随着它的广泛应用,它在实际应用当中也存在着一系列的安全问题,其中以计算机网络信息安全为主。对于计算机网络系统而言,网络信息在其中起着非常重要的作用,因此在大数据的背景下如何保证计算机网络信息安全,成了相关工作人员最应当重视的问题。因此,本文通过分析加强和保障计算机网络信息安全的一系列措施与方法以促进计算机网络系统的进步与发展。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 陈亚科;\\n',\n",
       " 'AD 煤炭科学技术研究院有限公司;\\n',\n",
       " 'T1 基于大数据时代下的计算机网络安全研究\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 159-161\\n',\n",
       " 'K1 大数据;计算机网络;网络安全态势感知\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 本文提出了与计算机网络安全相关的一种安全防御技术,即基于大数据背景的网络安全态势感知,其从感知系统的架构模型到数据预处理、从量化感知到动态预测,对于网络来说都能起到一定的安全保障作用,并符合当下大数据时代发展背景,特别针对异构数据源来说更能起到准确数据分析及预处理的作用。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 童瀛;姚焕章;周宇;\\n',\n",
       " 'AD 江苏省公安厅;\\n',\n",
       " 'T1 大数据背景下网络信息安全技术体系分析\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 67-68\\n',\n",
       " 'K1 大数据背景;网络信息安全;技术体系\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 近几年来,在我国网络数字化信息技术不断完善和进一步发展下,网络信息技术得到各个行业领域的认可和应用,网络信息技术也逐渐渗透到人们实际日常生活中,网络信息技术为人们日常生活和工作方面都带来了极大的便利。互联网通信技术随之也有进一步发展提升,对社会未来发展和进步起到推动作用,然而在网络信息技术不断发展中,还存在诸多问题,现代化社会处于大数据背景下,社会群众越来越关注网络信息安全问题,基于此,应该积极探究能够有效保障网络信息安全的办法,构建完善的网络信息安全技术体系,相关工作人员积极掌握了解网络信息技术中存在的问题,采用科学有效的解决办法,将网络信息中的安全隐患进行集中处理,从而有效的提升网络信息安全的安全性,促进我国社会科技未来可持续发展。本文针对大数据背景下网络信息安全技术体系进行深层次的探究分析,希望为构建完善的网络信息安全技术体系提供有效的理论依据。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 郑志荣;\\n',\n",
       " 'AD 西安汽车职业大学;\\n',\n",
       " 'T1 大数据系统中的计算机网络安全技术\\n',\n",
       " 'JF 网络安全技术与应用\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 71-73\\n',\n",
       " 'K1 大数据系统;计算机;网络安全技术\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 为了提高大数据系统的运行性能,保证信息数据传输和存储的可靠性和安全性,现针对计算机网络存在黑客、病毒、软件隐患等安全问题,在科学应用计算机网络安全技术的基础上,构建和设计出功能完善、实用性强的网络安全系统,确保计算机网络能够可靠、稳定、安全地运行,从而提高网络信息数据的保密性和安全性,为促进大数据系统的健康、可持续发展提供重要平台支持。\\n',\n",
       " 'SN 1009-6833\\n',\n",
       " 'CN 11-4522/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 马颖;\\n',\n",
       " 'AD 新疆交通职业技术学院;\\n',\n",
       " 'T1 基于大数据的计算机网络数据库安全技术\\n',\n",
       " 'JF 计算机与网络\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 09\\n',\n",
       " 'vo 47\\n',\n",
       " 'OP 51\\n',\n",
       " 'K1 数据库安全技术;使用权限;病毒代码;\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB <正>随着国家科技实力与经济实力的不断增长,我国也开启了新型的大数据时代。为了随时搜索、查看和应用这些规模庞大的数据,数据库也走入了各个行业之中。互联网与网上平台为无数网络用户提供了便利的数据查找服务,并以一个全新的面貌实现了大数据共享。但计算机网络环境从始至终都是复杂且未知的,所以基于网络的数据库也处于一个危险且脆弱的环境之中,如何维护数据库的安全是计算机网络安全领域中的重要问题。\\n',\n",
       " 'SN 1008-1739\\n',\n",
       " 'CN 13-1223/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 李智峰;\\n',\n",
       " 'AD 广东南方电信规划咨询设计院有限公司惠州分公司;\\n',\n",
       " 'T1 基于网格化和大数据的移动网络覆盖质量评估方法研究\\n',\n",
       " 'JF 无线互联科技\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 09\\n',\n",
       " 'vo 18\\n',\n",
       " 'OP 24-25\\n',\n",
       " 'K1 网格;移动网络覆盖质量;大数据;MR用户数据\\n',\n",
       " ' grid;mobile network coverage quality;Big Data;MR user data\\n',\n",
       " '\\n',\n",
       " 'AB 文章主要探讨了河源电信的4G及5G网络规划建设过程,研究运用大数据等各种工具全面分析移动网络覆盖质量,并以营销中心为目标,细分网格化管理运营,与市场线条形成良性互动,最大限度地提升资源投放效益,为各县区营销中心有效赋能,提升用户感知NPS的综合方法。\\n',\n",
       " 'SN 1672-6944\\n',\n",
       " 'CN 32-1675/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 张鑫;\\n',\n",
       " 'AD 黑龙江科技大学管理学院;\\n',\n",
       " 'T1 大数据支持下网络谣言智慧治理研究\\n',\n",
       " 'JF 合作经济与科技\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 10\\n',\n",
       " 'OP 178-179\\n',\n",
       " 'K1 大数据支持;大数据技术;网络谣言;智慧治理\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 基于大数据技术的网络谣言智慧治理是一个需要不断完善的新命题,是面对信息传播的新技术、新背景、新条件下的有力手段和有益探索。通过梳理网络谣言智慧治理的相关研究,厘清其逻辑内涵与理论根源,阐释大数据环境下网络谣言的鲜明特征,并提出大数据技术支持下的网络谣言智慧治理的优势及实现路径。\\n',\n",
       " 'SN 1672-190X\\n',\n",
       " 'CN 13-1296/N\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 徐选华;余紫昕;\\n',\n",
       " 'AD 中南大学商学院;\\n',\n",
       " 'T1 社会网络环境下基于公众行为大数据属性挖掘的大群体应急决策方法及应用\\n',\n",
       " 'JF 控制与决策\\n',\n",
       " 'OP 1-10\\n',\n",
       " 'K1 社会网络分析;公众行为大数据;属性挖掘;大群体;应急决策\\n',\n",
       " ' social network analysis;public behavior big data;attribute mining;big group;emergency decision-making\\n',\n",
       " '\\n',\n",
       " 'AB 针对社会网络环境下复杂大群体应急决策中决策属性信息难以获得问题,提出了社会网络环境下公众行为大数据驱动的大群体应急决策方法。首先,通过挖掘社交平台上的公众行为大数据,利用TF-IDF、Word2vec技术进行关键词提取、聚类及其影响力分析,从大量行为数据中挖掘大群体决策属性信息以辅助专家决策,使决策结果具有更高的科学性和有效性。其次,构建决策者间基于信任关系和观点相似度的社会网络,采用同时考虑信任和相似度的聚类方法对决策者进行聚类,并基于社会网络分析获得决策者权重;然后,提出基于决策者间信任关系的共识调整方法进行共识调整以获得最终群体决策矩阵和方案排序,通过引入决策者客观自信度避免个别决策者过分自信行为的影响。最后,通过一个新冠疫情案例分析说明了方法的可行性和有效性。\\n',\n",
       " 'SN 1001-0920\\n',\n",
       " 'CN 21-1124/TP\\n',\n",
       " 'LA 中文\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 华磊;\\n',\n",
       " 'AD 江苏春申律师事务所;\\n',\n",
       " 'T1 大数据时代网络犯罪的刑法应对\\n',\n",
       " 'JF 法制与社会\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 13\\n',\n",
       " 'OP 125-126\\n',\n",
       " 'K1 大数据时代;网络犯罪;人工智能\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 发达的网络技术的确为人们的生活提供了方便,在网络技术的帮助下,民众的生产、生活所需都能得到满足。但是这项新的技术得到发展之后,网络犯罪问题也就衍生出来了,网络犯罪是一种新的犯罪类型,它对社会的危害性非常大,如果没有有效的应对方法,人民群众的生命、财产安全会遭受巨大的威胁。从行业内反馈的情况来看,在大数据的时代背景之下,针对网络犯罪还没有有效的应对机制,网络安全法益出现了保护失衡的问题。对于有关部门来说,要充分利用大数据时代的特点,建立人工智能犯罪规制,减少社会上的网络犯罪的发生概率。\\n',\n",
       " 'SN 1009-0592\\n',\n",
       " 'CN 53-1095/D\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 蔡林;\\n',\n",
       " 'AD 中国移动通信集团贵州有限公司网络部网优中心;\\n',\n",
       " 'T1 基于jupyter的大数据分析工具在网络优化领域的应用研究\\n',\n",
       " 'JF 中国新通信\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 09\\n',\n",
       " 'vo 23\\n',\n",
       " 'OP 92-93\\n',\n",
       " 'K1 大数据;Jupyter Notebook;Hadoop;Spark;分布式计算;网络优化\\n',\n",
       " ' \\n',\n",
       " '\\n',\n",
       " 'AB 目的:介绍Jupyter Notebook在网络优化领域的应用情况。方法:集成Hadoop、Spark、Jupyter Notebook 等开源工具,搭建网络优化分析平台,基于真实案例验证其在网络优化领域应用的可行性。结果:通过搭建大数据计算环境,成功实现多数据接入、分布式运算、分布式存储、交互式应用及结果展示等功能,并基于该平台完成网络整体问题分析、问题原因定位分析、问题处理方案分析、问题处理效果分析等大数据分析任务。结论:结合网络优化的大数据分析需求,搭建便于使用的大数据分析环境,提升基于大数据的网络优化分析能力。\\n',\n",
       " 'SN 1673-4866\\n',\n",
       " 'CN 11-5402/TN\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 杨文学;\\n',\n",
       " 'AD 北京交通运输职业学院交通管理与信息工程系;\\n',\n",
       " 'T1 大数据时代下人工智能在计算机网络技术中的运用探讨\\n',\n",
       " 'JF 电脑知识与技术\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 13\\n',\n",
       " 'vo 17\\n',\n",
       " 'OP 188-190\\n',\n",
       " 'K1 大数据时代;人工智能;计算机网络技术\\n',\n",
       " ' big data era;artificial intelligence;computer network technology\\n',\n",
       " '\\n',\n",
       " 'AB 在现代信息科技快发展的过程中,人工智能逐渐呈现出多元的发展趋势,能够有效地提高计算机网络技术的稳定性和智能性,满足社会大众对海量数据的应用需求。而借助人工智能技术,处理和优化信息数据,可以充分地为我国计算机网络技术的发展奠定坚实的理论基础,提升计算机网络技术的应用成效。对此,本文结合人工智能和大数据的理论内涵,探析计算机网络技术中人工智能的应用优势和必要性,提出相应的应用策略。\\n',\n",
       " 'SN 1009-3044\\n',\n",
       " 'CN 34-1205/TP\\n',\n",
       " 'LA 中文;\\n',\n",
       " 'DS CNKI\\n',\n",
       " '\\n',\n",
       " 'RT Journal Article\\n',\n",
       " 'SR 1\\n',\n",
       " 'A1 陈丹妮;李晓蝶;李念;蒋元衡;欧吉军;\\n',\n",
       " 'AD 南京审计大学金审学院;\\n',\n",
       " 'T1 大数据模型下网络直播平台违约金合理性研究\\n',\n",
       " 'JF 中小企业管理与科技(上旬刊)\\n',\n",
       " 'YR 2021\\n',\n",
       " 'IS 05\\n',\n",
       " 'OP 138-139\\n',\n",
       " 'K1 资产评估;网络直播;损失\\n',\n",
       " ' asset assessment;live streaming;loss\\n',\n",
       " '\\n',\n",
       " 'AB 近年来,网络直播成为互联网时代兴起的热点话题,论文选取斗鱼、淘宝、抖音三个平台所属案例作为研究对象,以资产评估相关知识作为研究基础,从平台流量粉丝及线上销售获益两方面研究网络直播平台设定合同违约金的合理性,对直播平台合同违约金如何设置提出有效的建议。\\n',\n",
       " 'SN 1673-1069\\n',\n",
       " ...]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "with open('D:/CNKI/CNKI-20210702130438058.txt', encoding='utf-8') as f:\n",
    "    display(f.readlines())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
